#!/bin/bash
# SLURM batch script for the "tlggnv1" training run.
#
# Resources requested below: one node, 16 tasks, 2 GPUs, on partition "a30",
# pinned to host a30c08. Stdout/stderr of the job go to logs/tlggnv1/1.log
# (path is relative to the submission directory).
#
# NOTE(review): this job requests a single node, while the script body sets
# NNODES=2 and NODE_RANK=1 — presumably a companion job on another host runs
# rank 0 at the configured master address; confirm before submitting alone.
# NOTE(review): sbatch is not expected to create missing parent directories
# for --output; make sure logs/tlggnv1/ exists before submission — confirm.
#SBATCH --job-name=tlggnv1
#SBATCH --nodes=1
#SBATCH -n 16
#SBATCH --gres=gpu:2
#SBATCH --output=logs/tlggnv1/1.log
#SBATCH -p a30
#SBATCH --nodelist=a30c08

# Load conda's shell integration into this non-interactive batch shell, then
# activate the project environment. Both steps are checked: if either fails,
# abort instead of silently launching training with whatever python3 happens
# to be on PATH.
source /share/home/22351121/anaconda3/etc/profile.d/conda.sh || {
    printf 'error: cannot source conda.sh\n' >&2
    exit 1
}
# `conda activate` is the supported form once conda.sh has been sourced; the
# older `source activate` relies on an `activate` script being found on PATH.
conda activate Mevis || {
    printf 'error: cannot activate conda environment "Mevis"\n' >&2
    exit 1
}

# Tell NCCL not to use the InfiniBand transport for inter-process
# communication.
export NCCL_IB_DISABLE=1

# Launch topology. These are plain (non-exported) shell variables; they are
# only consumed by the launcher flags assembled below.
NUM_GPUS=2            # value for --nproc_per_node
DIST_URL=10.82.8.19   # value for --master_addr
NNODES=2              # value for --nnodes
NODE_RANK=1           # value for --node_rank

# Options interpreted by torch.distributed.launch itself.
launcher_flags=(
    --nproc_per_node "$NUM_GPUS"
    --nnodes "$NNODES"
    --node_rank "$NODE_RANK"
    --master_port 13325
    --master_addr "$DIST_URL"
    --use_env
)

# Options forwarded to train.py, in the same order as before.
train_flags=(
    --with_box_refine
    --dataset_file mevisv1
    --binary
    --batch_size 1
    --me tlggnv1
    --epochs 3
    --lr_drop 2
    --lr 0.00005
    --lr_backbone 0.000006
    --weight_decay 0.05
    --num_frames 5
    --backbone video_swin_t_p4w7
    --backbone_pretrained ./weights/swin_tiny_patch244_window877_kinetics400_1k.pth
    --output_dir ./results/tlggnv1
)

# The launcher is the last command, so its exit status becomes the job's.
python3 -m torch.distributed.launch "${launcher_flags[@]}" \
    train.py "${train_flags[@]}"
